#!/bin/sh
#
# Launch the "Streaming Word Count Sort" Hadoop streaming job.
#
# Steps:
#   1. Source the user's ~/.bashrc.
#   2. Remove streaming/output (the job's output path).
#   3. Run the streaming job over data/acm-template with map.py as the
#      mapper and reduce.py as the reducer.
#
# map.py, reduce.py and conf.py are given as relative paths, so the script
# is presumably meant to be run from the directory that contains them.

# NOTE(review): `hdfs` and `hadoop-streaming` are presumably aliases or
# functions defined in ~/.bashrc, which is why it is sourced first -- confirm.
. ~/.bashrc

job_name='Streaming Word Count Sort'
input_path=data/acm-template
output_path=streaming/output

# Clear the output path before the job runs. The exit status is deliberately
# not checked: the job is started even if this removal fails.
# NOTE(review): presumably the job will not write into an already existing
# output directory -- confirm against the Hadoop version in use.
hdfs -rmr "$output_path"

# conf.py is passed with -file alongside the two scripts; presumably it is
# loaded by map.py and/or reduce.py at run time -- verify.
hadoop-streaming \
  -D mapred.job.name="$job_name" \
  -input "$input_path" \
  -output "$output_path" \
  -mapper map.py \
  -reducer reduce.py \
  -file map.py \
  -file reduce.py \
  -file conf.py
